from paddleocr import PaddleOCR
from preprocess.file_paser.paser_utils import traverse_dir, re_filter
import json
import os

# Announce the OCR step on stdout before any model setup happens.
print("对图片进行OCR处理：")

# Image to run recognition on (hard-coded absolute path).
img_path = r'D:\Users\JHC258\projects\文本检索\preprocess\images\pdf_2_19_0.png'

# Build the engine a single time and reuse it: constructing PaddleOCR
# downloads the model (if needed) and loads it into memory.
ocr = PaddleOCR(
    use_angle_cls=True,
    lang="ch",
)
result = ocr.ocr(img_path, cls=True)

# Emits a blank line only; `result` itself is not printed here.
print()
